<!DOCTYPE html>



  


<html class="theme-next mist use-motion" lang="zh-cn">
<head>
  <meta charset="UTF-8">
<meta http-equiv="X-UA-Compatible" content="IE=edge">
<!-- Viewport deliberately sets no maximum-scale / user-scalable limit so visitors can pinch-zoom the page. -->
<meta name="viewport" content="width=device-width, initial-scale=1">
<meta name="theme-color" content="#222">









<meta http-equiv="Cache-Control" content="no-transform" />
<meta http-equiv="Cache-Control" content="no-siteapp" />
















  
  
  <!-- Stylesheets: order matters for the cascade (vendor CSS first, theme CSS last). -->
  <link rel="stylesheet" href="/lib/fancybox/source/jquery.fancybox.css?v=2.1.5">
  <link rel="stylesheet" href="/lib/font-awesome/css/font-awesome.min.css?v=4.6.2">
  <link rel="stylesheet" href="/css/main.css?v=5.1.4">

  <!-- Site icons. -->
  <link rel="apple-touch-icon" sizes="180x180" href="/images/apple-touch-icon-next.png?v=5.1.4">
  <link rel="icon" type="image/png" sizes="32x32" href="/images/favicon-32x32-next.png?v=5.1.4">
  <link rel="icon" type="image/png" sizes="16x16" href="/images/favicon-16x16-next.png?v=5.1.4">
  <link rel="mask-icon" href="/images/logo.svg?v=5.1.4" color="#222">





  <meta name="keywords" content="贝叶斯," />










<!-- Search/social metadata. og:url is kept identical to the page's canonical URL (directory form, no index.html). -->
<meta name="description" content="简述：基于概率论的分类方法 :朴素贝叶斯 通过分析7000个人的名字，分别计算男女名字中含有某个字的概率， 如果男孩子名字的概率大于女孩子的，则判断结果为男孩子。">
<meta property="og:type" content="article">
<meta property="og:title" content="输入名字识别男女开发全过程附实例">
<meta property="og:url" content="https://blog.sunan.me/2019/04/25/boy-or-girl/">
<meta property="og:site_name" content="苏南的博客">
<meta property="og:description" content="简述：基于概率论的分类方法 :朴素贝叶斯 通过分析7000个人的名字，分别计算男女名字中含有某个字的概率， 如果男孩子名字的概率大于女孩子的，则判断结果为男孩子。">
<meta property="og:locale" content="zh_CN">
<meta property="article:published_time" content="2019-04-25T04:00:00.000Z">
<meta property="article:modified_time" content="2020-03-21T08:15:56.898Z">
<meta property="article:author" content="Mofeng">
<meta property="article:tag" content="贝叶斯">
<meta name="twitter:card" content="summary">



<script type="text/javascript" id="hexo.configurations">
  // Theme namespace: reuse window.NexT when it already exists, otherwise start from an empty object.
  var NexT = window.NexT || {};

  // Page-level settings. Declared with `var` at the top level of a classic
  // script, so CONFIG becomes a global variable.
  var CONFIG = {
    root: '/',
    scheme: 'Mist',
    version: '5.1.4',

    sidebar: {
      position: 'left',
      display: 'post',
      offset: 12,
      b2t: false,
      scrollpercent: false,
      onmobile: false
    },

    fancybox: true,
    tabs: true,

    motion: {
      enable: true,
      async: false,
      // Animation name per page region.
      transition: {
        post_block: 'fadeIn',
        post_header: 'slideDownIn',
        post_body: 'slideDownIn',
        coll_header: 'slideLeftIn',
        sidebar: 'slideUpIn'
      }
    },

    duoshuo: {
      userId: '0',
      author: 'Author'
    },

    algolia: {
      // Credentials are empty strings on this page.
      applicationID: '',
      apiKey: '',
      indexName: '',
      hits: {
        per_page: 10
      },
      // ${query}, ${hits} and ${time} are literal text inside ordinary strings
      // (not template literals); presumably replaced by the search script — verify.
      labels: {
        input_placeholder: 'Search for Posts',
        hits_empty: "We didn't find any results for the search: ${query}",
        hits_stats: '${hits} results found in ${time} ms'
      }
    }
  };
</script>



  <link rel="canonical" href="https://blog.sunan.me/2019/04/25/boy-or-girl/"/>





  <title>输入名字识别男女开发全过程附实例 | 苏南的博客</title>
  








<meta name="generator" content="Hexo 4.2.0"></head>

<body itemscope itemtype="http://schema.org/WebPage" lang="zh-cn">

  
  
    
  

  <div class="container sidebar-position-left page-post-detail">
    <div class="headband"></div>

    <header id="header" class="header" itemscope itemtype="http://schema.org/WPHeader">
      <div class="header-inner"><div class="site-brand-wrapper">
  <div class="site-meta ">
    

    <div class="custom-logo-site-title">
      <a href="/"  class="brand" rel="start">
        <span class="logo-line-before"><i></i></span>
        <span class="site-title">苏南的博客</span>
        <span class="logo-line-after"><i></i></span>
      </a>
    </div>
      
        <p class="site-subtitle"></p>
      
  </div>

  <!-- Icon-only menu toggle: the three bars carry no text, so the button gets an explicit accessible name. -->
  <div class="site-nav-toggle">
    <button type="button" aria-label="Toggle navigation">
      <span class="btn-bar"></span>
      <span class="btn-bar"></span>
      <span class="btn-bar"></span>
    </button>
  </div>
</div>

<!-- Primary site menu. Icon glyphs are decorative (each link has visible text), so they are hidden from assistive technology. -->
<nav class="site-nav">
  <ul id="menu" class="menu">
    <li class="menu-item menu-item-home">
      <a href="/" rel="section">
        <i class="menu-item-icon fa fa-fw fa-home" aria-hidden="true"></i> <br>
        Home
      </a>
    </li>
    <li class="menu-item menu-item-archives">
      <a href="/archives/" rel="section">
        <i class="menu-item-icon fa fa-fw fa-archive" aria-hidden="true"></i> <br>
        Archives
      </a>
    </li>
    <li class="menu-item menu-item-about">
      <a href="/about/" rel="section">
        <i class="menu-item-icon fa fa-fw fa-user" aria-hidden="true"></i> <br>
        About
      </a>
    </li>
    <li class="menu-item menu-item-主站">
      <!-- External link to the main site; opens in a new tab. -->
      <a href="https://sunan.me" target="_blank" rel="section noopener">
        <i class="menu-item-icon fa fa-fw fa-home" aria-hidden="true"></i> <br>
        主站
      </a>
    </li>
  </ul>
</nav>



 </div>
    </header>

    <main id="main" class="main">
      <div class="main-inner">
        <div class="content-wrap">
          <div id="content" class="content">
            

  <div id="posts" class="posts-expand">
    

  

  
  
  

  <article class="post post-type-normal" itemscope itemtype="http://schema.org/Article">
  
  
  
  <div class="post-block">
    <link itemprop="mainEntityOfPage" href="https://blog.sunan.me/2019/04/25/boy-or-girl/">

    <span hidden itemprop="author" itemscope itemtype="http://schema.org/Person">
      <meta itemprop="name" content="Mofeng">
      <meta itemprop="description" content="">
      <meta itemprop="image" content="/images/avatar.gif">
    </span>

    <span hidden itemprop="publisher" itemscope itemtype="http://schema.org/Organization">
      <meta itemprop="name" content="苏南的博客">
    </span>

    
      <header class="post-header">
        <h1 class="post-title" itemprop="name headline">输入名字识别男女开发全过程附实例</h1>

        <!-- Post metadata line: publish date and category. Icon glyphs and the "|" divider are purely visual, so they are hidden from assistive technology. -->
        <div class="post-meta">
          <span class="post-time">
            <span class="post-meta-item-icon">
              <i class="fa fa-calendar-o" aria-hidden="true"></i>
            </span>
            <span class="post-meta-item-text">Posted on</span>
            <time title="Post created" itemprop="dateCreated datePublished" datetime="2019-04-25T12:00:00+08:00">
              2019-04-25
            </time>
          </span>

          <span class="post-category">
            <span class="post-meta-divider" aria-hidden="true">|</span>
            <span class="post-meta-item-icon">
              <i class="fa fa-folder-o" aria-hidden="true"></i>
            </span>
            <span class="post-meta-item-text">In</span>
            <span itemprop="about" itemscope itemtype="http://schema.org/Thing">
              <a href="/categories/%E6%9C%BA%E5%99%A8%E5%AD%A6%E4%B9%A0/" itemprop="url" rel="index">
                <span itemprop="name">机器学习</span>
              </a>
            </span>
          </span>
        </div>
      </header>
    

    
    
    
    <div class="post-body" itemprop="articleBody">

      
      

      
        <h3 id="简述："><a href="#简述：" class="headerlink" title="简述："></a>简述：</h3><p>基于概率论的分类方法 <strong>:朴素贝叶斯</strong></p>
<p>通过分析7000个人的名字，分别计算男女名字中含有某个字的概率，</p>
<p>如果男孩子名字的概率大于女孩子的，则判断结果为男孩子。</p>
<a id="more"></a>

<h3 id="算法部分"><a href="#算法部分" class="headerlink" title="算法部分"></a>算法部分</h3><h4 id="从数据库中读取名字和性别"><a href="#从数据库中读取名字和性别" class="headerlink" title="从数据库中读取名字和性别"></a>从数据库中读取名字和性别</h4><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br></pre></td><td class="code"><pre><span class="line"><span class="comment"># 从数据库中读取名字和性别</span></span><br><span class="line"><span class="comment"># 训练集数据为7000</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">input_name</span><span class="params">()</span>:</span></span><br><span class="line">    <span class="comment"># 连接数据库</span></span><br><span class="line">    conn = pymysql.connect(host=<span class="string">'localhost'</span>, port=<span class="number">3306</span>, user=<span class="string">'root'</span>, db=<span class="string">'person_name'</span>, charset=<span class="string">'utf8'</span>)</span><br><span class="line">    cursor = conn.cursor()</span><br><span class="line">    <span class="comment"># 读取数据</span></span><br><span class="line">    
cursor.execute(<span class="string">"SELECT * FROM student"</span>)</span><br><span class="line">    names_data = cursor.fetchmany(<span class="number">7000</span>)</span><br><span class="line">    <span class="comment"># 分类男女数据</span></span><br><span class="line">    boy_str = <span class="string">''</span></span><br><span class="line">    girl_str = <span class="string">''</span></span><br><span class="line">    <span class="keyword">for</span> i <span class="keyword">in</span> names_data:</span><br><span class="line">        <span class="comment"># 去除姓分别拼接所有名字为字符串</span></span><br><span class="line">        <span class="keyword">if</span> i[<span class="number">2</span>] == <span class="string">'男'</span>:</span><br><span class="line">            boy_str = boy_str + i[<span class="number">1</span>][<span class="number">1</span>:<span class="number">3</span>]</span><br><span class="line">        <span class="keyword">else</span>:</span><br><span class="line">            girl_str = girl_str + i[<span class="number">1</span>][<span class="number">1</span>:<span class="number">3</span>]</span><br><span class="line">    <span class="comment"># 保存为字典类型并返回</span></span><br><span class="line">    sex_data = &#123;<span class="string">'男'</span>: boy_str,</span><br><span class="line">                <span class="string">'女'</span>: girl_str</span><br><span class="line">                &#125;</span><br><span class="line">    <span class="comment"># 提交，不然无法保存新建或者修改的数据</span></span><br><span class="line">    conn.commit()</span><br><span class="line">    <span class="comment"># 关闭游标</span></span><br><span class="line">    cursor.close()</span><br><span class="line">    <span class="comment"># 关闭连接</span></span><br><span class="line">    conn.close()</span><br><span class="line">    <span class="keyword">return</span> sex_data</span><br></pre></td></tr></table></figure>
<h4 id="计算字符概率"><a href="#计算字符概率" class="headerlink" title="计算字符概率"></a>计算字符概率</h4><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br></pre></td><td class="code"><pre><span class="line"><span class="comment"># 计算字符概率</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">probability</span><span class="params">(words)</span>:</span></span><br><span class="line">    d = &#123;&#125;</span><br><span class="line">    <span class="comment"># 统计出现的字符个数</span></span><br><span class="line">    <span class="keyword">for</span> x <span class="keyword">in</span> words:</span><br><span class="line">        <span class="keyword">if</span> x <span class="keyword">in</span> d:</span><br><span class="line">            d[x] = d[x] + <span class="number">1</span></span><br><span class="line">        <span class="keyword">else</span>:</span><br><span class="line">            d[x] = <span class="number">1</span></span><br><span class="line">    <span class="comment"># 计算字符出现概率</span></span><br><span class="line">    word_probability = &#123;&#125;</span><br><span class="line">    <span class="keyword">for</span> i <span class="keyword">in</span> d:</span><br><span class="line">        word_probability[i] = d[i] / <span class="number">7000</span></span><br><span class="line">    <span class="keyword">return</span> word_probability</span><br></pre></td></tr></table></figure>

<h4 id="概率数据存入数据库"><a href="#概率数据存入数据库" class="headerlink" title="概率数据存入数据库"></a>概率数据存入数据库</h4><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br></pre></td><td class="code"><pre><span class="line"><span class="comment"># 概率数据存入数据库</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">save_mysql</span><span class="params">(word_data, sex)</span>:</span></span><br><span class="line">    <span class="comment"># 连接数据库</span></span><br><span class="line">    conn = pymysql.connect(host=<span class="string">'localhost'</span>, port=<span class="number">3306</span>, user=<span class="string">'root'</span>, db=<span class="string">'person_name'</span>, charset=<span class="string">'utf8'</span>)</span><br><span class="line">    cursor = conn.cursor()</span><br><span class="line">    <span class="keyword">if</span> sex == <span class="string">'男'</span>:</span><br><span class="line">        <span class="comment"># 循环存入数据</span></span><br><span class="line">        sql = <span class="string">"INSERT INTO boy (word,probability) VALUES (%s,%s)"</span></span><br><span class="line">        <span class="keyword">for</span> i <span class="keyword">in</span> word_data:</span><br><span class="line">            cursor.execute(sql, (i, 
word_data[i]))</span><br><span class="line">    <span class="keyword">else</span>:</span><br><span class="line">        <span class="comment"># 循环存入数据</span></span><br><span class="line">        sql = <span class="string">"INSERT INTO girl (word,probability) VALUES (%s,%s)"</span></span><br><span class="line">        <span class="keyword">for</span> i <span class="keyword">in</span> word_data:</span><br><span class="line">            cursor.execute(sql, (i, word_data[i]))</span><br><span class="line">    <span class="comment"># 提交，不然无法保存新建或者修改的数据</span></span><br><span class="line">    conn.commit()</span><br><span class="line">    <span class="comment"># 关闭游标</span></span><br><span class="line">    cursor.close()</span><br><span class="line">    <span class="comment"># 关闭连接</span></span><br><span class="line">    conn.close()</span><br></pre></td></tr></table></figure>

<h3 id="训练部分完整代码"><a href="#训练部分完整代码" class="headerlink" title="训练部分完整代码"></a>训练部分完整代码</h3><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br><span class="line">37</span><br><span class="line">38</span><br><span class="line">39</span><br><span class="line">40</span><br><span class="line">41</span><br><span class="line">42</span><br><span class="line">43</span><br><span class="line">44</span><br><span class="line">45</span><br><span class="line">46</span><br><span class="line">47</span><br><span class="line">48</span><br><span class="line">49</span><br><span class="line">50</span><br><span class="line">51</span><br><span class="line">52</span><br><span class="line">53</span><br><span class="line">54</span><br><span class="line">55</span><br><span class="line">56</span><br><span class="line">57</span><br><span 
class="line">58</span><br><span class="line">59</span><br><span class="line">60</span><br><span class="line">61</span><br><span class="line">62</span><br><span class="line">63</span><br><span class="line">64</span><br><span class="line">65</span><br><span class="line">66</span><br><span class="line">67</span><br><span class="line">68</span><br><span class="line">69</span><br><span class="line">70</span><br><span class="line">71</span><br><span class="line">72</span><br><span class="line">73</span><br><span class="line">74</span><br><span class="line">75</span><br><span class="line">76</span><br><span class="line">77</span><br><span class="line">78</span><br><span class="line">79</span><br><span class="line">80</span><br><span class="line">81</span><br><span class="line">82</span><br></pre></td><td class="code"><pre><span class="line"><span class="keyword">import</span> pymysql</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="comment"># 计算字符概率</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">probability</span><span class="params">(words)</span>:</span></span><br><span class="line">    d = &#123;&#125;</span><br><span class="line">    <span class="comment"># 统计出现的字符个数</span></span><br><span class="line">    <span class="keyword">for</span> x <span class="keyword">in</span> words:</span><br><span class="line">        <span class="keyword">if</span> x <span class="keyword">in</span> d:</span><br><span class="line">            d[x] = d[x] + <span class="number">1</span></span><br><span class="line">        <span class="keyword">else</span>:</span><br><span class="line">            d[x] = <span class="number">1</span></span><br><span class="line">    <span class="comment"># 计算字符出现概率</span></span><br><span class="line">    word_probability = &#123;&#125;</span><br><span class="line">    <span class="keyword">for</span> i <span class="keyword">in</span> 
d:</span><br><span class="line">        word_probability[i] = d[i] / <span class="number">7000</span></span><br><span class="line">    <span class="keyword">return</span> word_probability</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="comment"># 从数据库中读取名字和性别</span></span><br><span class="line"><span class="comment"># 训练集数据为7000</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">input_name</span><span class="params">()</span>:</span></span><br><span class="line">    <span class="comment"># 连接数据库</span></span><br><span class="line">    conn = pymysql.connect(host=<span class="string">'localhost'</span>, port=<span class="number">3306</span>, user=<span class="string">'root'</span>, db=<span class="string">'person_name'</span>, charset=<span class="string">'utf8'</span>)</span><br><span class="line">    cursor = conn.cursor()</span><br><span class="line">    <span class="comment"># 读取数据</span></span><br><span class="line">    cursor.execute(<span class="string">"SELECT * FROM student"</span>)</span><br><span class="line">    names_data = cursor.fetchmany(<span class="number">7000</span>)</span><br><span class="line">    <span class="comment"># 分类男女数据</span></span><br><span class="line">    boy_str = <span class="string">''</span></span><br><span class="line">    girl_str = <span class="string">''</span></span><br><span class="line">    <span class="keyword">for</span> i <span class="keyword">in</span> names_data:</span><br><span class="line">        <span class="comment"># 去除姓分别拼接所有名字为字符串</span></span><br><span class="line">        <span class="keyword">if</span> i[<span class="number">2</span>] == <span class="string">'男'</span>:</span><br><span class="line">            boy_str = boy_str + i[<span class="number">1</span>][<span class="number">1</span>:<span class="number">3</span>]</span><br><span class="line">        <span 
class="keyword">else</span>:</span><br><span class="line">            girl_str = girl_str + i[<span class="number">1</span>][<span class="number">1</span>:<span class="number">3</span>]</span><br><span class="line">    <span class="comment"># 保存为字典类型并返回</span></span><br><span class="line">    sex_data = &#123;<span class="string">'男'</span>: boy_str,</span><br><span class="line">                <span class="string">'女'</span>: girl_str</span><br><span class="line">                &#125;</span><br><span class="line">    <span class="comment"># 提交，不然无法保存新建或者修改的数据</span></span><br><span class="line">    conn.commit()</span><br><span class="line">    <span class="comment"># 关闭游标</span></span><br><span class="line">    cursor.close()</span><br><span class="line">    <span class="comment"># 关闭连接</span></span><br><span class="line">    conn.close()</span><br><span class="line">    <span class="keyword">return</span> sex_data</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="comment"># 概率数据存入数据库</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">save_mysql</span><span class="params">(word_data, sex)</span>:</span></span><br><span class="line">    <span class="comment"># 连接数据库</span></span><br><span class="line">    conn = pymysql.connect(host=<span class="string">'localhost'</span>, port=<span class="number">3306</span>, user=<span class="string">'root'</span>, db=<span class="string">'person_name'</span>, charset=<span class="string">'utf8'</span>)</span><br><span class="line">    cursor = conn.cursor()</span><br><span class="line">    <span class="keyword">if</span> sex == <span class="string">'男'</span>:</span><br><span class="line">        <span class="comment"># 循环存入数据</span></span><br><span class="line">        sql = <span class="string">"INSERT INTO boy (word,probability) VALUES (%s,%s)"</span></span><br><span class="line">        <span 
class="keyword">for</span> i <span class="keyword">in</span> word_data:</span><br><span class="line">            cursor.execute(sql, (i, word_data[i]))</span><br><span class="line">    <span class="keyword">else</span>:</span><br><span class="line">        <span class="comment"># 循环存入数据</span></span><br><span class="line">        sql = <span class="string">"INSERT INTO girl (word,probability) VALUES (%s,%s)"</span></span><br><span class="line">        <span class="keyword">for</span> i <span class="keyword">in</span> word_data:</span><br><span class="line">            cursor.execute(sql, (i, word_data[i]))</span><br><span class="line">    <span class="comment"># 提交，不然无法保存新建或者修改的数据</span></span><br><span class="line">    conn.commit()</span><br><span class="line">    <span class="comment"># 关闭游标</span></span><br><span class="line">    cursor.close()</span><br><span class="line">    <span class="comment"># 关闭连接</span></span><br><span class="line">    conn.close()</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="keyword">if</span> __name__ == <span class="string">'__main__'</span>:</span><br><span class="line">    <span class="comment"># 获取训练数据集</span></span><br><span class="line">    name_data = input_name()</span><br><span class="line">    <span class="comment"># 统计男孩名字名字出现字的概率</span></span><br><span class="line">    boy_probability = probability(name_data[<span class="string">'男'</span>])</span><br><span class="line">    girl_probability = probability(name_data[<span class="string">'女'</span>])</span><br><span class="line">    <span class="comment"># 存入数据库</span></span><br><span class="line">    save_mysql(boy_probability, <span class="string">'男'</span>)</span><br><span class="line">    save_mysql(girl_probability, <span class="string">'女'</span>)</span><br></pre></td></tr></table></figure>



<h3 id="应用部分完整代码"><a href="#应用部分完整代码" class="headerlink" title="应用部分完整代码"></a>应用部分完整代码</h3><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br><span class="line">37</span><br><span class="line">38</span><br><span class="line">39</span><br><span class="line">40</span><br><span class="line">41</span><br><span class="line">42</span><br><span class="line">43</span><br><span class="line">44</span><br><span class="line">45</span><br><span class="line">46</span><br><span class="line">47</span><br><span class="line">48</span><br><span class="line">49</span><br><span class="line">50</span><br><span class="line">51</span><br><span class="line">52</span><br><span class="line">53</span><br><span class="line">54</span><br><span class="line">55</span><br><span class="line">56</span><br><span class="line">57</span><br><span 
class="line">58</span><br><span class="line">59</span><br></pre></td><td class="code"><pre><span class="line"><span class="keyword">import</span> pymysql</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="comment"># 读取数据库</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">accept_mysql</span><span class="params">()</span>:</span></span><br><span class="line">    <span class="comment"># 连接数据库</span></span><br><span class="line">    conn = pymysql.connect(host=<span class="string">'localhost'</span>, port=<span class="number">3306</span>, user=<span class="string">'root'</span>, db=<span class="string">'person_name'</span>, charset=<span class="string">'utf8'</span>)</span><br><span class="line">    <span class="comment"># 读取男孩数据</span></span><br><span class="line">    boy_cursor = conn.cursor()</span><br><span class="line">    boy_cursor.execute(<span class="string">"SELECT * FROM boy"</span>)</span><br><span class="line">    boy_data = boy_cursor.fetchall()</span><br><span class="line">    <span class="comment"># 读取女孩数据</span></span><br><span class="line">    girl_cursor = conn.cursor()</span><br><span class="line">    girl_cursor.execute(<span class="string">"SELECT * FROM girl"</span>)</span><br><span class="line">    girl_data = girl_cursor.fetchall()</span><br><span class="line">    result = &#123;</span><br><span class="line">        <span class="string">'男'</span>: boy_data,</span><br><span class="line">        <span class="string">'女'</span>: girl_data</span><br><span class="line">    &#125;</span><br><span class="line">    <span class="keyword">return</span> result</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="comment"># 分析读取名字</span></span><br><span class="line"><span class="function"><span class="keyword">def</span> <span class="title">read_name</span><span class="params">(words, 
mysql_data_boy, mysql_data_girl)</span>:</span></span><br><span class="line">    boy_word_probability = <span class="number">0</span></span><br><span class="line">    girl_word_probability = <span class="number">0</span></span><br><span class="line">    <span class="keyword">for</span> x <span class="keyword">in</span> words:</span><br><span class="line">        <span class="comment"># 男孩</span></span><br><span class="line">        <span class="keyword">for</span> i <span class="keyword">in</span> range(len(mysql_data_boy)):</span><br><span class="line">            <span class="keyword">if</span> x == mysql_data_boy[i][<span class="number">1</span>]:</span><br><span class="line">                <span class="comment"># 如果名字是两个字以上，概率相加</span></span><br><span class="line">                boy_word_probability = boy_word_probability + mysql_data_boy[i][<span class="number">2</span>]</span><br><span class="line">            <span class="comment"># 女孩</span></span><br><span class="line">        <span class="keyword">for</span> i <span class="keyword">in</span> range(len(mysql_data_girl)):</span><br><span class="line">            <span class="keyword">if</span> x == mysql_data_girl[i][<span class="number">1</span>]:</span><br><span class="line">                <span class="comment"># 如果名字是两个字以上，概率相加</span></span><br><span class="line">                girl_word_probability = girl_word_probability + mysql_data_girl[i][<span class="number">2</span>]</span><br><span class="line">    result = &#123;</span><br><span class="line">        <span class="string">'男'</span>: boy_word_probability,</span><br><span class="line">        <span class="string">'女'</span>: girl_word_probability</span><br><span class="line">    &#125;</span><br><span class="line">    <span class="keyword">return</span> result</span><br><span class="line"> </span><br><span class="line"> </span><br><span class="line"><span class="keyword">if</span> __name__ == <span 
class="string">'__main__'</span>:</span><br><span class="line">    raw_name = input()</span><br><span class="line">    name = raw_name[<span class="number">1</span>:]</span><br><span class="line">    <span class="comment"># 获取数据库数据</span></span><br><span class="line">    mysql_data_boy = accept_mysql()[<span class="string">'男'</span>]</span><br><span class="line">    mysql_data_girl = accept_mysql()[<span class="string">'女'</span>]</span><br><span class="line">    <span class="comment"># 分析名字</span></span><br><span class="line">    boy_probability = read_name(name, mysql_data_boy, mysql_data_girl)[<span class="string">'男'</span>]</span><br><span class="line">    girl_probability = read_name(name, mysql_data_boy, mysql_data_girl)[<span class="string">'女'</span>]</span><br><span class="line">    <span class="keyword">if</span> boy_probability &gt; girl_probability:</span><br><span class="line">        print(<span class="string">'男孩子'</span>)</span><br><span class="line">    <span class="keyword">if</span> girl_probability &gt; boy_probability:</span><br><span class="line">        print(<span class="string">"女孩子"</span>)</span><br><span class="line">    <span class="keyword">if</span> girl_probability == boy_probability:</span><br><span class="line">        print(<span class="string">"不可能！"</span>)</span><br></pre></td></tr></table></figure>

<h3 id="DEMO"><a href="#DEMO" class="headerlink" title="DEMO"></a>DEMO</h3><p> 项目DEMO地址：<a href="http://boy-girl.netlab.sunan.me/" target="_blank" rel="noopener">http://boy-girl.netlab.sunan.me</a> </p>
<p><strong>爬虫太多，服务已关闭</strong><br><em>2020.03.21</em></p>

      
    </div>
    
    
    

    

    

    

    <footer class="post-footer">
      
        <div class="post-tags">
          
            <a href="/tags/%E8%B4%9D%E5%8F%B6%E6%96%AF/" rel="tag"># 贝叶斯</a>
          
        </div>
      

      
      
      

      
        <div class="post-nav">
          <div class="post-nav-next post-nav-item">
            
              <a href="/2019/01/24/double-wordpress/" rel="next" title="双站点二级目录配置wordpress伪静态">
                <i class="fa fa-chevron-left"></i> 双站点二级目录配置wordpress伪静态
              </a>
            
          </div>

          <span class="post-nav-divider"></span>

          <div class="post-nav-prev post-nav-item">
            
              <a href="/2019/10/13/hexo-github-blog/" rel="prev" title="利用Hexo和GitHub搭建独立博客">
                利用Hexo和GitHub搭建独立博客 <i class="fa fa-chevron-right"></i>
              </a>
            
          </div>
        </div>
      

      
      
    </footer>
  </div>
  
  
  
  </article>



    <div class="post-spread">
      
    </div>
  </div>


          </div>
          


          

  



        </div>
        
          
  
  <div class="sidebar-toggle">
    <div class="sidebar-toggle-line-wrap">
      <span class="sidebar-toggle-line sidebar-toggle-line-first"></span>
      <span class="sidebar-toggle-line sidebar-toggle-line-middle"></span>
      <span class="sidebar-toggle-line sidebar-toggle-line-last"></span>
    </div>
  </div>

  <aside id="sidebar" class="sidebar">
    
    <div class="sidebar-inner">

      

      
        <ul class="sidebar-nav motion-element">
          <li class="sidebar-nav-toc sidebar-nav-active" data-target="post-toc-wrap">
            Table of Contents
          </li>
          <li class="sidebar-nav-overview" data-target="site-overview-wrap">
            Overview
          </li>
        </ul>
      

      <section class="site-overview-wrap sidebar-panel">
        <div class="site-overview">
          <div class="site-author motion-element" itemprop="author" itemscope itemtype="http://schema.org/Person">
            
              <p class="site-author-name" itemprop="name">Mofeng</p>
              <p class="site-description motion-element" itemprop="description"></p>
          </div>

          <nav class="site-state motion-element">

            
              <div class="site-state-item site-state-posts">
              
                <a href="/archives/">
              
                  <span class="site-state-item-count">5</span>
                  <span class="site-state-item-name">posts</span>
                </a>
              </div>
            

            
              
              
              <div class="site-state-item site-state-categories">
                
                  <span class="site-state-item-count">4</span>
                  <span class="site-state-item-name">categories</span>
                
              </div>
            

            
              
              
              <div class="site-state-item site-state-tags">
                
                  <span class="site-state-item-count">8</span>
                  <span class="site-state-item-name">tags</span>
                
              </div>
            

          </nav>

          

          
            <div class="links-of-author motion-element">
                
                  <span class="links-of-author-item">
                    <a href="https://github.com/mofengboy" target="_blank" rel="noopener" title="GitHub" aria-label="GitHub">
                      
                        <i class="fa fa-fw fa-github"></i></a>
                  </span>
                
            </div>
          

          
          

          
          

          

        </div>
      </section>

      
      <!--noindex-->
        <section class="post-toc-wrap motion-element sidebar-panel sidebar-panel-active">
          <div class="post-toc">

            
              
            

            
              <div class="post-toc-content"><ol class="nav"><li class="nav-item nav-level-3"><a class="nav-link" href="#简述："><span class="nav-number">1.</span> <span class="nav-text">简述：</span></a></li><li class="nav-item nav-level-3"><a class="nav-link" href="#算法部分"><span class="nav-number">2.</span> <span class="nav-text">算法部分</span></a><ol class="nav-child"><li class="nav-item nav-level-4"><a class="nav-link" href="#从数据库中读取名字和性别"><span class="nav-number">2.1.</span> <span class="nav-text">从数据库中读取名字和性别</span></a></li><li class="nav-item nav-level-4"><a class="nav-link" href="#计算字符概率"><span class="nav-number">2.2.</span> <span class="nav-text">计算字符概率</span></a></li><li class="nav-item nav-level-4"><a class="nav-link" href="#概率数据存入数据库"><span class="nav-number">2.3.</span> <span class="nav-text">概率数据存入数据库</span></a></li></ol></li><li class="nav-item nav-level-3"><a class="nav-link" href="#训练部分完整代码"><span class="nav-number">3.</span> <span class="nav-text">训练部分完整代码</span></a></li><li class="nav-item nav-level-3"><a class="nav-link" href="#应用部分完整代码"><span class="nav-number">4.</span> <span class="nav-text">应用部分完整代码</span></a></li><li class="nav-item nav-level-3"><a class="nav-link" href="#DEMO"><span class="nav-number">5.</span> <span class="nav-text">DEMO</span></a></li></ol></div>
            

          </div>
        </section>
      <!--/noindex-->
      

      

    </div>
  </aside>


        
      </div>
    </main>

    <footer id="footer" class="footer">
      <div class="footer-inner">
        <div class="copyright">&copy; 2010 &mdash; <span itemprop="copyrightYear">2020</span>
  <span class="with-love">
    <i class="fa fa-user"></i>
  </span>
  <span class="author" itemprop="copyrightHolder">陌风小同学</span>

  
</div>








  <div class="footer-custom">ICP证：<a target="_blank" rel="noopener" href="http://www.beian.miit.gov.cn">鲁ICP备15022835号-1</a> | <script type="text/javascript" src="https://s95.cnzz.com/z_stat.php?id=1259526004&amp;web_id=1259526004"></script> | Hosted by GitHub Pages &amp;&amp; Gitee Pages</div>


        







        
      </div>
    </footer>

    
      <div class="back-to-top">
        <i class="fa fa-arrow-up"></i>
        
      </div>
    

    

  </div>

  

<script type="text/javascript">
  // Normalize window.Promise: unless it is a function (its
  // Object.prototype.toString tag is '[object Function]'), reset it to null.
  // NOTE(review): presumably this lets the scripts loaded afterwards treat a
  // missing or non-function Promise uniformly as "unavailable" — confirm
  // against the consumers before changing.
  if (Object.prototype.toString.call(window.Promise) !== '[object Function]') {
    window.Promise = null;
  }
</script>









  












  
  
    <script type="text/javascript" src="/lib/jquery/index.js?v=2.1.3"></script>
  

  
  
    <script type="text/javascript" src="/lib/fastclick/lib/fastclick.min.js?v=1.0.6"></script>
  

  
  
    <script type="text/javascript" src="/lib/jquery_lazyload/jquery.lazyload.js?v=1.9.7"></script>
  

  
  
    <script type="text/javascript" src="/lib/velocity/velocity.min.js?v=1.2.1"></script>
  

  
  
    <script type="text/javascript" src="/lib/velocity/velocity.ui.min.js?v=1.2.1"></script>
  

  
  
    <script type="text/javascript" src="/lib/fancybox/source/jquery.fancybox.pack.js?v=2.1.5"></script>
  


  


  <script type="text/javascript" src="/js/src/utils.js?v=5.1.4"></script>

  <script type="text/javascript" src="/js/src/motion.js?v=5.1.4"></script>



  
  

  
  <script type="text/javascript" src="/js/src/scrollspy.js?v=5.1.4"></script>
<script type="text/javascript" src="/js/src/post-details.js?v=5.1.4"></script>



  


  <script type="text/javascript" src="/js/src/bootstrap.js?v=5.1.4"></script>



  


  




	





  





  












  





  

  

  

  
  

  

  

  

</body>
</html>
